1 ggpubr

1.1 options & settings

For scrollable output

options(scipen = 999)

1.3 Loading libs

# install.packages("gapminder")
library(tidyverse)
library(ggpubr)
library(gapminder)

1.4 creating theme_viny_bright

theme_viny_bright <- function(){
  
  library(ggthemes)
  
  ggthemes::theme_fivethirtyeight() %+replace%
  
  theme(
    axis.title = element_text(),
    
    axis.text = element_text(size = 13),
    
    legend.text = element_text(size = 10),
    
    panel.background = element_rect(fill = "white"),
    
    plot.background = element_rect(fill = "white"),
    
    strip.background = element_blank(),
    
    legend.background = element_rect(fill = NA),
    
    legend.key = element_rect(fill = NA),

    plot.title = element_text(hjust = 0.5,
                              size = 19,
                              face = "bold"),
    plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
      )
  
  }

1.5 Loading gapminder lib data

gapminder %>% head()
gapminder %>% glimpse()
Rows: 1,704
Columns: 6
$ country   <fct> Afghanistan, Afghanistan, Afghanistan, Afghanistan, Afghanistan, Afghanistan, Afgh...
$ continent <fct> Asia, Asia, Asia, Asia, Asia, Asia, Asia, Asia, Asia, Asia, Asia, Asia, Europe, Eu...
$ year      <int> 1952, 1957, 1962, 1967, 1972, 1977, 1982, 1987, 1992, 1997, 2002, 2007, 1952, 1957...
$ lifeExp   <dbl> 28.801, 30.332, 31.997, 34.020, 36.088, 38.438, 39.854, 40.822, 41.674, 41.763, 42...
$ pop       <int> 8425333, 9240934, 10267083, 11537966, 13079460, 14880372, 12881816, 13867957, 1631...
$ gdpPercap <dbl> 779.4453, 820.8530, 853.1007, 836.1971, 739.9811, 786.1134, 978.0114, 852.3959, 64...
attach(gapminder)

1.5.1 Boxplot within Violin & more

violin_plot1 <- gapminder %>% filter(year == max(year)) %>% 
  
  ggpubr::ggviolin(., x = "continent", y = "gdpPercap", 
                   fill = "continent", color = "continent", 
                   add = "boxplot", add.params = list(fill = "white", shape = "continent"))

set_palette(violin_plot1, palette = "jco")

violin_plot2 <- gapminder %>% filter(year == max(year)) %>% 
  
  ggpubr::ggviolin(., x = "continent", y = "gdpPercap", 
                   color = "continent", 
                   add = "point")

set_palette(violin_plot2, palette = "jco")

violin_plot3 <- gapminder %>% filter(year == max(year)) %>% 
  
  ggpubr::ggviolin(., x = "continent", y = "gdpPercap", 
                   color = "continent", 
                   add = "point")

set_palette(violin_plot3, palette = "jco")

violin_plot4 <- gapminder %>% filter(year == max(year)) %>% 
  
  ggpubr::ggviolin(., x = "continent", y = "gdpPercap", 
                   color = "continent", 
                   add = "jitter")

set_palette(violin_plot4, palette = "jco")

1.6 Loading latest gapminder data

gapminder_new <- read_csv("E:/3. R/gapminder data/income - gdppercap/gdppercapita_us_inflation_adjusted.csv")

head(gapminder_new)
dim(gapminder_new)
[1] 191  61
gapminder_new %>% select(country,"2010","2014","2017","2019") %>% head()
gap_longer <- gapminder_new %>% 
  pivot_longer(cols = !country, names_to = "year", values_to = "gdpPercap") 

gap_longer %>% head()
dim(gap_longer)
[1] 11460     3
gap_longer <- gap_longer %>% mutate(year = as.integer(year))
gap_longer %>% filter(year == max(year)) 
gap_longer %>% filter(year == max(year)) %>% count(country)
gap_longer %>% filter(year == max(year)) %>% count(country) %>% filter(n > 1)
gapminder %>% group_by(country, continent) %>% count()
gap_longer <- left_join(x = gap_longer, 
             y = gapminder %>% 
               group_by(country, continent) %>% 
               count() %>% 
               select(country, continent) ,
             by =  "country") 

gap_longer %>% head()
dim(gap_longer)
[1] 11460     4
gap_longer$continent %>% levels()
[1] "Africa"   "Americas" "Asia"     "Europe"   "Oceania" 
gap_longer %>% filter(is.na(continent)) %>% select(country) %>% unique() %>%  head()
fill_continents_df <- data.frame(
  
  country = c("Andorra", "Antigua and Barbuda", "Armenia",              
              "Azerbaijan", "Bahamas", "Barbados", "Belarus", 
              "Belize", "Bhutan",   "Brunei"),

  continent = c("Europe", "Americas", "Europe", "Europe", "Americas", 
                "Americas", "Europe", "Americas", "Asia", "Asia")
)

fill_continents_df
NA
top_30 <- gap_longer %>% 
  filter(!is.na(continent), year %in% c(2019)) %>% 
  top_n(n = 30, wt = gdpPercap) %>% 
  arrange(gdpPercap)

top_30 %>%  head()

1.6.1 Publish ready bar plots

Plot from: http://www.sthda.com/english/articles/24-ggpubr-publication-ready-plots/

ggbarplot(top_30, x = "country", y = "gdpPercap", fill = "continent",
          color = "white",
          palette = "jco", 
          sort.val = "desc", 
          sort.by.groups = F, 
          x.text.angle = 90)

ggbarplot(top_30, x = "country", y = "gdpPercap", fill = "continent",
          color = "white",
          palette = "jco", 
          sort.val = "asc", 
          sort.by.groups = T, 
          x.text.angle = 90)

1.6.2 Publish ready lollypop plots

ggdotchart(top_30, x = "country", y = "gdpPercap",
          color = "continent",
          palette = "jco", 
          sort.val = "desc", 
          sort.by.groups = T, 
          add = "segments",
          rotate = TRUE,
          group = "continent",
          dot.size = 6,
          label = top_30$gdpPercap,
          font.label = list(color = "black", size = 12, vjust = 0.5, hjust = -1),
          ggtheme = theme_pubr()
          )

ggdotchart(top_30, x = "country", y = "gdpPercap",
          color = "continent",
          palette = "jco", 
          sorting = "desc", 
          sort.by.groups = T, 
          add = "segments",
          rotate = TRUE,
          group = "continent",
          dot.size = 9,
          label = top_30$gdpPercap,
          font.label = list(color = "black", size = 12, vjust = 0.5, hjust = -1),
          ggtheme = theme_pubr()
          )

from:

https://rpkgs.datanovia.com/ggpubr/reference/ggdotchart.html http://www.sthda.com/english/articles/24-ggpubr-publication-ready-plots/

ggdotchart(top_30, x = "country", y = "gdpPercap",
          color = "continent",
          palette = "jco", 
          sorting = "desc", 
          sort.by.groups = T, 
          add = "segments",
          # rotate = TRUE,
          group = "continent",
          dot.size = 9,
          label = top_30$gdpPercap,
          font.label = list(color = "black", size = 12, vjust = 0.5, hjust = -1),
          ggtheme = theme_pubr(),
          # x.text.col = TRUE
          )

2 Highlight Plots

library(gghighlight)
ggplot(data = gap_longer) +
  geom_line(col = "grey", aes(x = year, y = gdpPercap, group = country)) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank()
          ) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5))

ggplot(data = gap_longer) +
  geom_line(col = "grey", aes(x = year, y = gdpPercap, group = country)) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank()
          ) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10() 

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway","Denmark") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, group = country, col = highlight_type)) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank()
          ) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10() +
  scale_colour_manual(values = c("grey", "black")) +
  scale_size_manual(values = c(.5, 7))

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, group = country, col = country)) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank()
          ) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10() + 
  gghighlight(highlight_type == "Yes") +
  labs(title = "GDP/Capita (Income / Person) in $ of Countries wrt to time",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita)" 
       )

2.0.1 Log scale

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10(labels = scales::comma) + 
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Income(Log of GDP/Capita in $) of world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita) i.e Multiplier scale" 
       )

ggsave(filename = "gdpPerCap_log_highlighted_chi.jpg", dpi = 300, height = 8, width = 10)

2.0.2 Facet Log scale

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10(labels = scales::comma) + 
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Income(Log of GDP/Capita in $) of world countries based on continents across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita) i.e Multiplier scale" 
       )

ggsave(filename = "gdpPerCap_log_highlighted_facet_chi.jpg", dpi = 300, height = 8, width = 10)

2.0.3 Normal scale

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_continuous(labels = scales::comma, 
                     breaks = seq(from = 0, to = 200000, by = 25000)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Income(GDP/Capita in $) of world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Income (GDP / Capita) in $" 
       )

ggsave(filename = "gdpPerCap_norm_highlighted_chi.jpg", dpi = 300, height = 8, width = 10)

2.0.4 Facet Normal scale

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_continuous(labels = scales::comma, 
                     breaks = seq(from = 0, to = 200000, by = 25000)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Income(GDP/Capita in $) of world countries based on continents across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Income (GDP / Capita) in $" 
       )

ggsave(filename = "gdpPerCap_norm_highlighted_facet_chi.jpg", dpi = 300, height = 8, width = 10)

2.1 Applying theme_viny_bright

2.1.1 Log scale

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10(labels = scales::comma) + 
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Income(Log of GDP/Capita in $) of world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita) i.e Multiplier scale" 
       )

ggsave(filename = "gdpPerCap_log_highlighted_pink.jpg", dpi = 300, height = 8, width = 10)

2.1.2 Facet Log scale

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10(labels = scales::comma) + 
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  facet_wrap(~continent) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Income(Log of GDP/Capita in $) of world countries based on continents across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita) i.e Multiplier scale" 
       )

ggsave(filename = "gdpPerCap_log_highlighted_facet_pink.jpg", dpi = 300, height = 8, width = 10)

2.1.3 Normal scale

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_continuous(labels = scales::comma, 
                     breaks = seq(from = 0, to = 200000, by = 25000)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Income(GDP/Capita in $) of world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Income (GDP / Capita) in $" 
       )

ggsave(filename = "gdpPerCap_norm_highlighted_pink.jpg", dpi = 300, height = 8, width = 10)

2.1.4 Facet Normal scale

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_continuous(labels = scales::comma, 
                     breaks = seq(from = 0, to = 200000, by = 25000)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  facet_wrap(~continent) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Income(GDP/Capita in $) of world countries based on continents across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Income (GDP / Capita) in $" 
       )

ggsave(filename = "gdpPerCap_norm_highlighted_facet_pink.jpg", dpi = 300, height = 8, width = 10)

2.2 Loading tax data

2.2.1 Data source:

https://ourworldindata.org/taxation

tax_rev_to_gdp <- read_csv("E:/3. R/ourworldindata.org/total-tax-revenues-gdp.csv")

head(tax_rev_to_gdp)
tax_rev_to_gdp <- tax_rev_to_gdp %>% 
  rename("tax_revnue_perc_of_gdp" = "Total tax revenue (% of GDP) (ICTD (2019))",
         "country" = "Entity",
         "year" = "Year")

head(tax_rev_to_gdp)

Adding continent

tax_rev <- left_join(x = tax_rev_to_gdp,
          y = gapminder %>% 
            group_by(country, continent) %>% 
            count() %>% 
            select(country, continent),
          by = "country"
            )

summary(tax_rev)
   country              Code                year      tax_revnue_perc_of_gdp    continent   
 Length:5318        Length:5318        Min.   :1980   Min.   : 0.08581       Africa  :1309  
 Class :character   Class :character   1st Qu.:1993   1st Qu.:11.63091       Americas: 722  
 Mode  :character   Mode  :character   Median :2002   Median :18.01959       Asia    : 749  
                                       Mean   :2001   Mean   :20.05868       Europe  : 926  
                                       3rd Qu.:2009   3rd Qu.:27.63104       Oceania :  75  
                                       Max.   :2017   Max.   :56.91614       NA's    :1537  
attach(tax_rev)
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
ggplot() +
  geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
  scale_y_continuous(#labels = scales::percent,
                     breaks = seq(from = 0, to = 40, by = 5)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  # facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Total Tax Revenue % of GDP" 
       )

tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
ggplot() +
  geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
  scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
                     breaks = seq(from = 0, to = 40, by = 5)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Total Tax Revenue % of GDP" 
       )
Error in label_dollar(prefix = "", suffix = " %") : 
  could not find function "label_dollar"

2.2.2 Applying theme_viny_bright

library(scales)
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
ggplot() +
  geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
  scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
                     breaks = seq(from = 0, to = 60, by = 5)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  # facet_wrap(~continent) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Total Tax Revenue % of GDP" 
       )

tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
ggplot() +
  geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
  scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
                     breaks = seq(from = 0, to = 60, by = 5)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("#ffaa33", 0.4))) +
  facet_wrap(~continent) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Total Tax Revenue % of GDP" 
       )

2.3 user defined function

udf_tax_rev_plot <- function(background_line_color = grey){
  
  background_line_color = enquo(background_line_color)

  tax_rev %>% 
    mutate(highlight_type = case_when(country %in%
                                   c("India","Singapore","Malaysia","Norway",
                                     "Denmark","United States","United Kingdom","China") ~ "Yes",
                                 TRUE ~ "No")) %>%
  ggplot() +
    geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
    scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
    scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
                       breaks = seq(from = 0, to = 60, by = 5)) +
    gghighlight(highlight_type == "Yes",
                unhighlighted_params = list(size = 1, colour = alpha(background_line_color, 0.4))) +
    facet_wrap(~continent) +
    theme_viny_bright() +
    theme(axis.text.x = element_text(angle = 90)
            ) +
    labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
         subtitle = "created by ViSa",
         caption = "Data Source: Gapminder",
         y = "Total Tax Revenue % of GDP" 
         )
}
udf_tax_rev_plot(pink)
Error: Unknown colour name: ~
udf_tax_rev_plot <- function(background_line_color = grey){
  
  background_line_color = enquo(background_line_color)
  
  print(as_label(background_line_color) )


}

udf_tax_rev_plot("#33ffff")  #33ffff
[1] "\"#33ffff\""
attach(gapminder)

country_highlight_plot <- function(df = gapminder, y_var = gdpPercap, 
                                   background_line_color = "grey", 
                                   countries = default_list 
                                   ){
  
  # default list of highlight countries
  default_list = c("India","Singapore","Malaysia","Norway",
                                     "Denmark","United States","United Kingdom","China")
  
  # quoting y-axis variable
  y_var = enquo(y_var)

  # Data Prep.
  df %>% 
    mutate(highlight_type = case_when(country %in% countries ~ "Yes",
                                      TRUE ~ "No")) %>%
  # Plotting  
  ggplot() +
    geom_line(aes(x = year, y = round(!!y_var,2), col = country), size = 1.1) +
    
    # scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
    # scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
    #                    breaks = seq(from = 0, to = 60, by = 5)) +
    
    gghighlight(highlight_type == "Yes",
                unhighlighted_params = list(size = 1, colour = alpha(background_line_color, 0.4))) +
    # facet_wrap(~continent) +
    
    theme_viny_bright() +
    theme(axis.text.x = element_text(angle = 90)
            ) +
    
    labs(title = "GDP/Cap for world countries across time",
         subtitle = "created by ViSa",
         caption = "Data Source: Gapminder",
         y = "Total Tax Revenue % of GDP" 
         )
}

country_highlight_plot(df = gap_longer, countries = c("Australia","Singapore"), background_line_color = "pink")

2.4 ggcharts lib for dumbell plot

getting issues with this

library(ggcharts)
head(gapminder_new)
data("popeurope")
head(popeurope)
popeurope %>% 
  filter(country %in% c("India","Singapore","Malaysia","Norway",
                        "Denmark","United States","United Kingdom","China")) %>% 
  ggcharts::dumbbell_chart(x = country,
                           y1 = pop1952,
                           y2 = pop2007,
                           top_n = 10,
                           point_colors = c("lightgray","orange")
                            ) +
   scale_y_continuous(
    limits = c(0, NA),
    labels = function(x) paste(x, "Mn.")
  ) +
  theme_ng()

dumbbell_chart(
  data = popeurope,
  x = country,
  y1 = pop1952,
  y2 = pop2007,
  top_n = 10,
  point_colors = c("lightgray", "#494F5C")
) +
  labs(
    x = NULL,
    y = "Population",
    title = "Europe's Largest Countries by Population in 2007"
  ) +
  scale_y_continuous(
    limits = c(0, NA),
    labels = function(x) paste(x, "Mn.")
  )

gapminder_new %>% 
  select(country, "2010", "2019") %>% head() 

2.5 ggalt for dumbell plots

# devtools::install_github('bbc/bbplot')

library(ggalt)
library(bbplot)
gapminder_new %>% 
  select(country, "2010", "2019") %>% 
  mutate(gap = "2019" - "2010") %>% head() 
Error: Problem with `mutate()` input `gap`.
x non-numeric argument to binary operator
i Input `gap` is `"2019" - "2010"`.
Run `rlang::last_error()` to see where the error occurred.
gapminder %>%
  filter(year == 1967 | year == 2007) %>%
  select(country, year, lifeExp) %>%
  spread(year, lifeExp) %>%
  mutate(gap = `2007` - `1967`) %>%
  arrange(desc(gap)) %>%
  head(10)
gapminder_new %>% 
  filter(country %in% c("India","Singapore","Malaysia","Norway",
                        "Denmark","United States","United Kingdom","China")) %>% 
  select(country, "2010", "2019") %>% 
  mutate(gap = .[["2019"]] - .[["2010"]]) %>%
  arrange(desc(gap)) %>%
  
  ggplot(aes(x = .[["2010"]], xend = .[["2019"]], 
         y = reorder(country, gap), group = country)) +
  geom_dumbbell(colour = "#dddddd", size = 2,
                colour_x = "grey", colour_xend = "#FAAB18") +
  bbc_style()

gapminder_new %>% 
  filter(country %in% c("India","Singapore","Malaysia","Norway",
                        "Denmark","United States","United Kingdom","China")) %>% 
  select(country, "1970", "2019") %>% 
  mutate(gap = .[["2019"]] - .[["1970"]]) %>% 
  arrange(desc(gap)) %>%

  ggplot(aes(x = .[["1970"]], xend = .[["2019"]],
         y = reorder(country, gap), group = country)) +
  geom_dumbbell(colour = "#dddddd", size = 2,
                colour_x = "grey", colour_xend = "#FAAB18") +
  bbc_style()

head(gap_longer)
gap_longer %>%
  group_by(continent) %>% 
  filter(country == top_n(x=.,n=5,wt=gdpPercap) %>% select(country))
Error: Problem with `filter()` input `..1`.
x Input `..1` must be of size 2940 or 1, not size 30.
i Input `..1` is `country == top_n(x = ., n = 5, wt = gdpPercap) %>% select(country)`.
i The error occurred in group 1: continent = "Africa".
Run `rlang::last_error()` to see where the error occurred.

Below code gives top 5 countries by gdpPercap across the years

Overall_top5 <- gap_longer %>% 
  group_by(continent, country) %>% 
  summarise(gdpPercap = max(gdpPercap, na.rm = T)) %>% 
  top_n(n = 5, wt = gdpPercap) %>% 
  ungroup()

Overall_top5

Below code gives top 5 countries by gdpPercap of each continent across the years

gap_longer %>% 
  filter(
         country %in% (Overall_top5 %>% pull(country))) %>% 
  ggplot(aes(x = year, y = gdpPercap, color = country)) +
  geom_line() +
  facet_wrap(~continent) +
  theme_viny_bright() +
  theme(legend.position = "none",
        axis.text.x = element_text(angle = 90))

Overall_top5 %>% select(country)
gap_longer %>% 
  filter(year == 2019,
         country %in% (Overall_top5 %>% pull(country)))
gap_longer %>% 
  filter(year == 2019,
         country %in% Overall_top5$country ) 
NA
gap_longer %>% 
  filter(
    year == 2019,
    country %in% (Overall_top5 %>% pull(country))
  )
gap_longer %>% 
    filter(year == 2019, country %in% Overall_top5) 
gap_longer %>% 
    filter(year == 2019, country %in% Overall_top5) %>% 
    pull(country)
character(0)
gap_longer %>% 
    filter(year == 2019, country %in% Overall_top5$country) %>% 
    select(country)
top5_by_continents <- gap_longer %>% 
    filter(year == 2019, country %in% Overall_top5$country) %>% 
    pull(country)

top5_by_continents
 [1] "Australia"            "Botswana"             "Canada"               "Chile"               
 [5] "Denmark"              "Equatorial Guinea"    "Gabon"                "Ireland"             
 [9] "Israel"               "Japan"                "Kuwait"               "Libya"               
[13] "Liechtenstein"        "Luxembourg"           "Mauritius"            "Monaco"              
[17] "New Zealand"          "Norway"               "San Marino"           "Saudi Arabia"        
[21] "Singapore"            "Sweden"               "Switzerland"          "Trinidad and Tobago" 
[25] "United Arab Emirates" "United States"        "Venezuela"           
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% top5_by_continents ~ "Yes",
                                                 TRUE ~ "No"))  %>% 
  #filter(!is.na(continent)) %>% filter(!is.na(gdpPercap)) %>% #head()
  na.exclude %>% 
  ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  gghighlight(highlight_type == "Yes", 
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 60),
        legend.position = "none")

tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
  ggplot() +
  geom_line(aes(x = year, y = tax_revnue_perc_of_gdp, col = as.factor(country)), size = 1.1) +
  gghighlight(highlight_type == "Yes", 
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 60),
        legend.position = "none")

gap_longer %>% 
  mutate(highlight_type = case_when(country %in% top5_by_continents ~ "Yes",
                                                 TRUE ~ "No"))  %>% 
  #filter(!is.na(continent)) %>% filter(!is.na(gdpPercap)) %>% #head()
  na.exclude %>% summary()
   country               year        gdpPercap        continent    highlight_type    
 Length:6700        Min.   :1960   Min.   :  132   Africa  :2473   Length:6700       
 Class :character   1st Qu.:1978   1st Qu.:  910   Americas:1403   Class :character  
 Mode  :character   Median :1993   Median : 3135   Asia    :1318   Mode  :character  
                    Mean   :1992   Mean   : 9938   Europe  :1396                     
                    3rd Qu.:2006   3rd Qu.:12400   Oceania : 110                     
                    Max.   :2019   Max.   :92600                                     
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
  summary()
   country              Code                year      tax_revnue_perc_of_gdp    continent   
 Length:5318        Length:5318        Min.   :1980   Min.   : 0.08581       Africa  :1309  
 Class :character   Class :character   1st Qu.:1993   1st Qu.:11.63091       Americas: 722  
 Mode  :character   Mode  :character   Median :2002   Median :18.01959       Asia    : 749  
                                       Mean   :2001   Mean   :20.05868       Europe  : 926  
                                       3rd Qu.:2009   3rd Qu.:27.63104       Oceania :  75  
                                       Max.   :2017   Max.   :56.91614       NA's    :1537  
 highlight_type    
 Length:5318       
 Class :character  
 Mode  :character  
                   
                   
                   

3 plotly highlight charts

from:

https://stackoverflow.com/questions/64385240/is-there-a-way-to-have-a-highlighted-chart-as-well-as-have-interactivity-of-sele?noredirect=1#comment113856801_64385240

https://plotly-r.com/client-side-linking.html#filter

library(plotly)
# from ggplot2 library

data("txhousing")
txhousing %>% glimpse()
Rows: 8,602
Columns: 9
$ city      <chr> "Abilene", "Abilene", "Abilene", "Abilene", "Abilene", "Abilene", "Abilene", "Abil...
$ year      <int> 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2001, 2001...
$ month     <int> 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 1, 2...
$ sales     <dbl> 72, 98, 130, 98, 141, 156, 152, 131, 104, 101, 100, 92, 75, 112, 118, 105, 150, 13...
$ volume    <dbl> 5380000, 6505000, 9285000, 9730000, 10590000, 13910000, 12635000, 10710000, 761500...
$ median    <dbl> 71400, 58700, 58100, 68600, 67300, 66900, 73500, 75000, 64500, 59300, 70900, 65000...
$ listings  <dbl> 701, 746, 784, 785, 794, 780, 742, 765, 771, 764, 721, 658, 779, 700, 738, 810, 77...
$ inventory <dbl> 6.3, 6.6, 6.8, 6.9, 6.8, 6.6, 6.2, 6.4, 6.5, 6.6, 6.2, 5.7, 6.8, 6.0, 6.4, 7.0, 6....
$ date      <dbl> 2000.000, 2000.083, 2000.167, 2000.250, 2000.333, 2000.417, 2000.500, 2000.583, 20...
txhousing %>%  head()
tx <- highlight_key(txhousing, ~city)
base <- plot_ly(tx, color = I("grey")) %>% 
  group_by(city)
time_series <- base %>% 
                  group_by(city) %>% 
                  add_lines(x = ~date, y = ~median)
highlight(
  time_series,
  on = "plotly_hover",
  selectize = FALSE,
  dynamic = FALSE,
  color = "red",
  persistent = FALSE
)
Error in dirname(to) : path too long
plotly_1 <- gap_longer %>% 
  filter(continent == "Asia") %>% 
  na.exclude() %>% 
  
  plotly::highlight_key(., ~country)
base <- plot_ly(plotly_1, color = I("grey")) %>% 
  group_by(country)
time_series <- base %>% 
              group_by(country) %>% 
              add_lines(x = ~year, y = ~gdpPercap)
highlight(
  time_series,
  on = "plotly_hover",
  selectize = FALSE,
  dynamic = FALSE,
  color = "red",
  persistent = FALSE
)
Error in dirname(to) : path too long
plotly_1 <- gap_longer %>% 
  filter(continent == "Asia", gdpPercap < max(20000)) %>% 
  na.exclude() %>% 
  
  plotly::highlight_key(., ~country)
base <- plot_ly(plotly_1, color = I("grey")) %>% 
  group_by(country)
tme_series <- base %>% 
              group_by(country) %>% 
              add_lines(x = ~year, y = ~gdpPercap)
highlight(
  time_series,
  on = "plotly_click",
  selectize = TRUE,
  dynamic = TRUE,
  color = "red",
  persistent = TRUE
)
Error in dirname(to) : path too long
hist <- add_histogram(
  base,
  x = ~gdpPercap,
  histnorm = "probability density"
)

subplot(time_series, hist, nrows = 2) %>% 
  layout(barmode = "overlay", showlegend = FALSE) %>% 
  highlight(
    dynamic = TRUE,
    selectize = TRUE,
    color = "red",
    selected = attrs_selected(opacity = 0.3)
  )
Error in dirname(to) : path too long

3.0.1 Trying to subtract row wise

gapminder_new %>% 
  filter(country == c("India","Bangladesh"))

3.0.1.1 failed attempts

gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .[["India",]] - .[["Bangladesh",]]
Error: Subscript can't be missing for tibbles in `[[`.
Run `rlang::last_error()` to see where the error occurred.
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .["India",] - .["Bangladesh",]
Error: object '.' not found
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .[country == "India",] - .[country == "Bangladesh",]
Error: Must subset rows with a valid subscript vector.
i Logical subscripts must match the size of the indexed input.
x Input has size 2 but subscript `country == "India"` has size 1704.
Run `rlang::last_error()` to see where the error occurred.
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .[India,] - .[Bangladesh,]
Error in `[.tbl_df`(., India, ) : object 'India' not found
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .[[India,]] - .[[Bangladesh,]]
Error: Subscript can't be missing for tibbles in `[[`.
Run `rlang::last_error()` to see where the error occurred.
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  mutate(Diff_result = (. %>% filter(country == "India") ) - (. %>% filter(country == "Bangladesh"))  )
Error: Problem with `mutate()` input `Diff_result`.
x non-numeric argument to binary operator
i Input `Diff_result` is `-...`.
Run `rlang::last_error()` to see where the error occurred.
gapminder_new[country == "India",] - gapminder_new[country == "Bangladesh",]
Error: Must subset rows with a valid subscript vector.
i Logical subscripts must match the size of the indexed input.
x Input has size 191 but subscript `country == "India"` has size 1704.
Run `rlang::last_error()` to see where the error occurred.
gapminder_new[India,] - gapminder_new[Bangladesh,]
Error in `[.tbl_df`(gapminder_new, India, ) : object 'India' not found
gapminder_new %>% 
  filter(country == "India")
rownames(gapminder_new[country == "India",])
Error: Must subset rows with a valid subscript vector.
i Logical subscripts must match the size of the indexed input.
x Input has size 191 but subscript `country == "India"` has size 1704.
Run `rlang::last_error()` to see where the error occurred.
rownames(gapminder_new[country == India,])
Error in `[.tbl_df`(gapminder_new, country == India, ) : 
  object 'India' not found
gapminder_new[country == "India",]
Error: Must subset rows with a valid subscript vector.
i Logical subscripts must match the size of the indexed input.
x Input has size 191 but subscript `country == "India"` has size 1704.
Run `rlang::last_error()` to see where the error occurred.
gapminder_new
rownames(gapminder_new) <- gapminder_new$country
gapminder_new %>%  head()
gapminder_new["India", 2: ncol(gapminder_new)] #- gapminder_new["Bangladesh", ]
gapminder_new[, 2:ncol(gapminder_new)]

3.0.1.2 solution from stackoverflow

https://stackoverflow.com/questions/64410966/how-to-subtract-a-row-from-another-row-in-r

gapminder_new %>% 
  filter(country %in% c("India","Bangladesh")) %>% 
  select(-1) %>% 
  mutate(across(everything(), ~lead(.x) - (.x))) %>% na.omit()
gapminder_new %>% select(-1) %>% mutate(across(everything(), ~lead(.x) - (.x))) %>% na.omit()
gapminder_new %>% 
  filter(country %in% c("India","Bangladesh"))

3.0.1.3 My own solution

test_set <- as.data.frame(gapminder_new)

rownames(test_set) <- test_set$country

head(test_set)
test_set %>%  select(-country)

test_set["India",2:ncol(test_set)] - test_set["Bangladesh",2:ncol(test_set)]

3.0.2 setting toolips / highcharter

from: https://jkunst.com/blog/posts/2019-02-04-using-tooltips-in-unexpected-ways/

library(highcharter)

3.0.2.1 Series chart

gp <- gapminder %>% 
  arrange(desc(year)) %>% 
  distinct(country, .keep_all = TRUE)

head(gp)
gp2 <- gapminder %>% 
  select(country, year, pop) %>% 
  nest(-country) %>% 
  mutate(
    data = map(data, mutate_mapping, hcaes(x = year, y = pop), drop = TRUE),
    data = map(data, list_parse)
  ) %>% 
  rename(ttdata = data)

gp2
gptot <- left_join(gp, gp2, by = "country")

head(gptot)
hchart(
  gptot,
  "point",
  hcaes(x = lifeExp, y = gdpPercap, name = country, 
        size=pop, group=continent, name=country)
) %>% 
  
  hc_yAxis(type = "logarithmic") %>% 
  
  # this is what creates a chart in tooltip
  hc_tooltip(
    useHTML = TRUE,
    headerFormat = "<b>{point.key}</b>",
    pointFormatter = tooltip_chart(accesor = "ttdata")
  ) %>% 
  
  hc_title(text = "Tooltip chart within a Chart") %>% 
  hc_subtitle(text = "(ttchart: population growth)")
3.0.2.1.1 log
gp2_log <- gapminder %>% 
  select(country, year, pop) %>% 
  nest(-country) %>% 
  mutate(
    data = map(data, mutate_mapping, hcaes(x = year, y = log(pop)), drop = TRUE),
    data = map(data, list_parse)
  ) %>% 
  rename(ttdata_log = data)

gp2_log
gptot_log <- left_join(gp, gp2_log, by = "country")

head(gptot_log)
hchart(
  gptot_log,
  "point",
  hcaes(x = lifeExp, y = gdpPercap, name = country, 
        size=pop, group=continent, name=country)
) %>% 
  
  hc_yAxis(type = "logarithmic") %>% 
  
  # this is what creates a chart in tooltip
  hc_tooltip(
    useHTML = TRUE,
    headerFormat = "<b>{point.key}</b>",
    pointFormatter = tooltip_chart(accesor = "ttdata_log")
  ) %>% 
  
  hc_title(text = "Tooltip chart within a Chart") %>% 
  hc_subtitle(text = "(ttchart: log population growth)")

3.0.2.2 donut chart

from: https://jkunst.com/blog/posts/2019-02-04-using-tooltips-in-unexpected-ways/

donutdata <- gp %>% 
  group_by(continent) %>% 
  summarise(pop = sum(pop/1e6) * 1e6)

donutdata
hchart(donutdata, "pie",
       hcaes(name = continent, y = pop), innerSize = 300)
hc <- hchart(
  donutdata2, "pie", hcaes(name = continent, y = pop),
  innerSize = 375
)

hc
hc %>% 
  hc_tooltip(
    useHTML = TRUE,
    headerFormat = "<b>{point.key}</b>",
    pointFormatter = tooltip_chart(
      accesor = "ttdata",
      hc_opts = list(
        chart = list(type = "scatter"),
        credits = list(enabled = FALSE),
        plotOptions = list(scatter = list(marker = list(radius = 2)))
        ),
      height = 225
      ),
    positioner = JS(
      "function () {
      
        /* one of the most important parts! */
        xp =  this.chart.chartWidth/2 - this.label.width/2
        yp =  this.chart.chartHeight/2 - this.label.height/2
      
        return { x: xp, y: yp };
      
      }"),
    shadow = FALSE,
    borderWidth = 0,
    backgroundColor = "transparent",
    hideDelay = 1000
  )
---
title: "ggpubr, gapminder, tax highlight plots"
output: 
  html_notebook:
    highlight: tango
    df_print: paged
    toc: true
    toc_float: 
      collapsed: false
      smooth_scroll: false
    number_sections: true
    toc_depth: 6
---


# ggpubr

## options & settings

For scrollable output

```{css, echo=FALSE}
.scroll-100 {
  max-height: 100px;
  overflow-y: auto;
  background-color: inherited;
}


h1, #TOC>ul>li {
  color: #B64D3A;
}

h2, #TOC>ul>ul>li {
  color: #000000;
}

h3, #TOC>ul>ul>ul>li {
  color: #643cb2;
}

h4, #TOC>ul>ul>ul>ul>li {
  color: #ae0058;
}

h5, #TOC>ul>ul>ul>ul>ul>li {
  color: #ffa447;
}

h6, #TOC>ul>ul>ul>ul>ul>ul>li {
  color: #DAE3D9;
}


```


```{r setup, include=FALSE}
knitr::opts_chunk$set(echo = TRUE, message = FALSE, warning = FALSE, dpi = 300, out.width = "100%",attr.output='style="max-height: 300px;"')
```


```{r}
options(scipen = 999)
```

## Source

http://www.sthda.com/english/articles/24-ggpubr-publication-ready-plots/
https://youtu.be/NJquUKavAOI
https://youtu.be/UvRaNJC05Ec


## Loading libs

```{r}
# install.packages("gapminder")
```


```{r}
library(tidyverse)
library(ggpubr)
library(gapminder)
```

## creating theme_viny_bright

```{r}
theme_viny_bright <- function(){
  
  library(ggthemes)
  
  ggthemes::theme_fivethirtyeight() %+replace%
  
  theme(
    axis.title = element_text(),
    
    axis.text = element_text(size = 13),
    
    legend.text = element_text(size = 10),
    
    panel.background = element_rect(fill = "white"),
    
    plot.background = element_rect(fill = "white"),
    
    strip.background = element_blank(),
    
    legend.background = element_rect(fill = NA),
    
    legend.key = element_rect(fill = NA),

    plot.title = element_text(hjust = 0.5,
                              size = 19,
                              face = "bold"),
    plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
      )
  
  }
```


## Loading gapminder lib data

```{r}
gapminder %>% head()
```


```{r}
gapminder %>% glimpse()
```

```{r}
attach(gapminder)
```


### Boxplot within Violin & more 

```{r}
violin_plot1 <- gapminder %>% filter(year == max(year)) %>% 
  
  ggpubr::ggviolin(., x = "continent", y = "gdpPercap", 
                   fill = "continent", color = "continent", 
                   add = "boxplot", add.params = list(fill = "white", shape = "continent"))

set_palette(violin_plot1, palette = "jco")
```


```{r}
violin_plot2 <- gapminder %>% filter(year == max(year)) %>% 
  
  ggpubr::ggviolin(., x = "continent", y = "gdpPercap", 
                   color = "continent", 
                   add = "point")

set_palette(violin_plot2, palette = "jco")
```


```{r}
violin_plot3 <- gapminder %>% filter(year == max(year)) %>% 
  
  ggpubr::ggviolin(., x = "continent", y = "gdpPercap", 
                   color = "continent", 
                   add = "point")

set_palette(violin_plot3, palette = "jco")
```



```{r}
violin_plot4 <- gapminder %>% filter(year == max(year)) %>% 
  
  ggpubr::ggviolin(., x = "continent", y = "gdpPercap", 
                   color = "continent", 
                   add = "jitter")

set_palette(violin_plot4, palette = "jco")
```

## Loading latest gapminder data

```{r}
gapminder_new <- read_csv("E:/3. R/gapminder data/income - gdppercap/gdppercapita_us_inflation_adjusted.csv")

head(gapminder_new)
```


```{r}
dim(gapminder_new)
```


```{r}
gapminder_new %>% select(country,"2010","2014","2017","2019") %>% head()
```

```{r}
gap_longer <- gapminder_new %>% 
  pivot_longer(cols = !country, names_to = "year", values_to = "gdpPercap") 

gap_longer %>% head()
```

```{r}
dim(gap_longer)
```

```{r}
gap_longer <- gap_longer %>% mutate(year = as.integer(year))
```



```{r}
gap_longer %>% filter(year == max(year)) 
```


```{r}
gap_longer %>% filter(year == max(year)) %>% count(country)
```


```{r}
gap_longer %>% filter(year == max(year)) %>% count(country) %>% filter(n > 1)
```

```{r}
gapminder %>% group_by(country, continent) %>% count()
```



```{r}
gap_longer <- left_join(x = gap_longer, 
             y = gapminder %>% 
               group_by(country, continent) %>% 
               count() %>% 
               select(country, continent) ,
             by =  "country") 

gap_longer %>% head()
```



```{r}
dim(gap_longer)
```


```{r}
gap_longer$continent %>% levels()
```


```{r}
gap_longer %>% filter(is.na(continent)) %>% select(country) %>% unique() %>%  head()
```

```{r}
fill_continents_df <- data.frame(
  
  country = c("Andorra", "Antigua and Barbuda", "Armenia", 				
              "Azerbaijan",	"Bahamas", "Barbados", "Belarus", 
              "Belize", "Bhutan",	"Brunei"),

  continent = c("Europe", "Americas", "Europe", "Europe", "Americas", 
                "Americas", "Europe", "Americas", "Asia", "Asia")
)

fill_continents_df

```



```{r}
top_30 <- gap_longer %>% 
  filter(!is.na(continent), year %in% c(2019)) %>% 
  top_n(n = 30, wt = gdpPercap) %>% 
  arrange(gdpPercap)

top_30 %>%  head()
```

### Publish ready bar plots

Plot from: http://www.sthda.com/english/articles/24-ggpubr-publication-ready-plots/


```{r}
ggbarplot(top_30, x = "country", y = "gdpPercap", fill = "continent",
          color = "white",
          palette = "jco", 
          sort.val = "desc", 
          sort.by.groups = F, 
          x.text.angle = 90)
```

```{r}
ggbarplot(top_30, x = "country", y = "gdpPercap", fill = "continent",
          color = "white",
          palette = "jco", 
          sort.val = "asc", 
          sort.by.groups = T, 
          x.text.angle = 90)
```

### Publish ready lollypop plots

```{r fig.height=9}
ggdotchart(top_30, x = "country", y = "gdpPercap",
          color = "continent",
          palette = "jco", 
          sort.val = "desc", 
          sort.by.groups = T, 
          add = "segments",
          rotate = TRUE,
          group = "continent",
          dot.size = 6,
          label = top_30$gdpPercap,
          font.label = list(color = "black", size = 12, vjust = 0.5, hjust = -1),
          ggtheme = theme_pubr()
          )
```


```{r fig.height=9}
ggdotchart(top_30, x = "country", y = "gdpPercap",
          color = "continent",
          palette = "jco", 
          sorting = "desc", 
          sort.by.groups = T, 
          add = "segments",
          rotate = TRUE,
          group = "continent",
          dot.size = 9,
          label = top_30$gdpPercap,
          font.label = list(color = "black", size = 12, vjust = 0.5, hjust = -1),
          ggtheme = theme_pubr()
          )
```

from: 

https://rpkgs.datanovia.com/ggpubr/reference/ggdotchart.html
http://www.sthda.com/english/articles/24-ggpubr-publication-ready-plots/

```{r fig.height=9}
ggdotchart(top_30, x = "country", y = "gdpPercap",
          color = "continent",
          palette = "jco", 
          sorting = "desc", 
          sort.by.groups = T, 
          add = "segments",
          # rotate = TRUE,
          group = "continent",
          dot.size = 9,
          label = top_30$gdpPercap,
          font.label = list(color = "black", size = 12, vjust = 0.5, hjust = -1),
          ggtheme = theme_pubr(),
          # x.text.col = TRUE
          )
```


# Highlight Plots

```{r}
library(gghighlight)
```


```{r}
ggplot(data = gap_longer) +
  geom_line(col = "grey", aes(x = year, y = gdpPercap, group = country)) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank()
          ) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5))
```


```{r}
ggplot(data = gap_longer) +
  geom_line(col = "grey", aes(x = year, y = gdpPercap, group = country)) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank()
          ) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10() 
```

```{r}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway","Denmark") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, group = country, col = highlight_type)) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank()
          ) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10() +
  scale_colour_manual(values = c("grey", "black")) +
  scale_size_manual(values = c(.5, 7))
```


```{r}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, group = country, col = country)) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank()
          ) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10() + 
  gghighlight(highlight_type == "Yes") +
  labs(title = "GDP/Capita (Income / Person) in $ of Countries wrt to time",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita)" 
       )
```

### Log scale

```{r fig.width=10, fig.height=12}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10(labels = scales::comma) + 
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Income(Log of GDP/Capita in $) of world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita) i.e Multiplier scale" 
       )
```

```{r}
ggsave(filename = "gdpPerCap_log_highlighted_chi.jpg", dpi = 300, height = 8, width = 10)
```


### Facet Log scale

```{r fig.width=10, fig.height=10}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10(labels = scales::comma) + 
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Income(Log of GDP/Capita in $) of world countries based on continents across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita) i.e Multiplier scale" 
       )
```

```{r}
ggsave(filename = "gdpPerCap_log_highlighted_facet_chi.jpg", dpi = 300, height = 8, width = 10)
```



### Normal scale

```{r fig.width=10, fig.height=10}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_continuous(labels = scales::comma, 
                     breaks = seq(from = 0, to = 200000, by = 25000)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Income(GDP/Capita in $) of world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Income (GDP / Capita) in $" 
       )
```


```{r}
ggsave(filename = "gdpPerCap_norm_highlighted_chi.jpg", dpi = 300, height = 8, width = 10)
```

### Facet Normal scale

```{r fig.width=10, fig.height=10}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_continuous(labels = scales::comma, 
                     breaks = seq(from = 0, to = 200000, by = 25000)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Income(GDP/Capita in $) of world countries based on continents across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Income (GDP / Capita) in $" 
       )
```


```{r}
ggsave(filename = "gdpPerCap_norm_highlighted_facet_chi.jpg", dpi = 300, height = 8, width = 10)
```


## Applying theme_viny_bright


### Log scale

```{r fig.width=10, fig.height=12}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10(labels = scales::comma) + 
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Income(Log of GDP/Capita in $) of world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita) i.e Multiplier scale" 
       )
```


```{r}
ggsave(filename = "gdpPerCap_log_highlighted_pink.jpg", dpi = 300, height = 8, width = 10)
```


### Facet Log scale

```{r fig.width=10, fig.height=10}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_log10(labels = scales::comma) + 
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  facet_wrap(~continent) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Income(Log of GDP/Capita in $) of world countries based on continents across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Log of Income (GDP / Capita) i.e Multiplier scale" 
       )
```

```{r}
ggsave(filename = "gdpPerCap_log_highlighted_facet_pink.jpg", dpi = 300, height = 8, width = 10)
```



### Normal scale

```{r fig.width=10, fig.height=10}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_continuous(labels = scales::comma, 
                     breaks = seq(from = 0, to = 200000, by = 25000)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Income(GDP/Capita in $) of world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Income (GDP / Capita) in $" 
       )
```


```{r}
ggsave(filename = "gdpPerCap_norm_highlighted_pink.jpg", dpi = 300, height = 8, width = 10)
```

### Facet Normal scale

```{r fig.width=10, fig.height=10}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% 
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>% 
ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1960, to = 2020, by = 5)) +
  scale_y_continuous(labels = scales::comma, 
                     breaks = seq(from = 0, to = 200000, by = 25000)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  facet_wrap(~continent) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Income(GDP/Capita in $) of world countries based on continents across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Income (GDP / Capita) in $" 
       )
```


```{r}
ggsave(filename = "gdpPerCap_norm_highlighted_facet_pink.jpg", dpi = 300, height = 8, width = 10)
```



## Loading tax data

### Data source: 

https://ourworldindata.org/taxation


```{r}
tax_rev_to_gdp <- read_csv("E:/3. R/ourworldindata.org/total-tax-revenues-gdp.csv")

head(tax_rev_to_gdp)
```

```{r}
tax_rev_to_gdp <- tax_rev_to_gdp %>% 
  rename("tax_revnue_perc_of_gdp" = "Total tax revenue (% of GDP) (ICTD (2019))",
         "country" = "Entity",
         "year" = "Year")

head(tax_rev_to_gdp)
```

Adding continent

```{r}
tax_rev <- left_join(x = tax_rev_to_gdp,
          y = gapminder %>% 
            group_by(country, continent) %>% 
            count() %>% 
            select(country, continent),
          by = "country"
            )

summary(tax_rev)
```



```{r}
attach(tax_rev)
```


```{r fig.width=10, fig.height=10}
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
ggplot() +
  geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
  scale_y_continuous(#labels = scales::percent,
                     breaks = seq(from = 0, to = 40, by = 5)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  # facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Total Tax Revenue % of GDP" 
       )
```


```{r fig.width=10, fig.height=10}
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
ggplot() +
  geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
  scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
                     breaks = seq(from = 0, to = 40, by = 5)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 90),
        legend.position = "none",
        panel.grid.major = element_blank(),
        panel.grid.minor = element_blank(),
        plot.title = element_text(hjust = 0.5),
        plot.subtitle = element_text(hjust = 0.5, colour = "maroon")
          ) +
  labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Total Tax Revenue % of GDP" 
       )
```

### Applying theme_viny_bright

```{r}
library(scales)
```


```{r fig.width=10, fig.height=10}
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
ggplot() +
  geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
  scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
                     breaks = seq(from = 0, to = 60, by = 5)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("pink", 0.4))) +
  # facet_wrap(~continent) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Total Tax Revenue % of GDP" 
       )
```


```{r fig.width=10, fig.height=10}
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
ggplot() +
  geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
  scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
  scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
                     breaks = seq(from = 0, to = 60, by = 5)) +
  gghighlight(highlight_type == "Yes",
              unhighlighted_params = list(size = 1, colour = alpha("#ffaa33", 0.4))) +
  facet_wrap(~continent) +
  theme_viny_bright() +
  theme(axis.text.x = element_text(angle = 90)
          ) +
  labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
       subtitle = "created by ViSa",
       caption = "Data Source: Gapminder",
       y = "Total Tax Revenue % of GDP" 
       )
```

## user defined function

```{r fig.width=10, fig.height=10}
udf_tax_rev_plot <- function(background_line_color = grey){
  
  background_line_color = enquo(background_line_color)

  tax_rev %>% 
    mutate(highlight_type = case_when(country %in%
                                   c("India","Singapore","Malaysia","Norway",
                                     "Denmark","United States","United Kingdom","China") ~ "Yes",
                                 TRUE ~ "No")) %>%
  ggplot() +
    geom_line(aes(x = year, y = round(tax_revnue_perc_of_gdp,2), col = country), size = 1.1) +
    scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
    scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
                       breaks = seq(from = 0, to = 60, by = 5)) +
    gghighlight(highlight_type == "Yes",
                unhighlighted_params = list(size = 1, colour = alpha(background_line_color, 0.4))) +
    facet_wrap(~continent) +
    theme_viny_bright() +
    theme(axis.text.x = element_text(angle = 90)
            ) +
    labs(title = "Total Tax Revenue earned % of GDP for world countries across time",
         subtitle = "created by ViSa",
         caption = "Data Source: Gapminder",
         y = "Total Tax Revenue % of GDP" 
         )
}
```

```{r fig.height=10, fig.width=10}
udf_tax_rev_plot(pink)
```


```{r}
udf_tax_rev_plot <- function(background_line_color = grey){
  
  background_line_color = enquo(background_line_color)
  
  print(as_label(background_line_color) )


}

udf_tax_rev_plot("#33ffff")  #33ffff
```

```{r}
attach(gapminder)
```




```{r fig.height=10, fig.width=10}

country_highlight_plot <- function(df = gapminder, y_var = gdpPercap, 
                                   background_line_color = "grey", 
                                   countries = default_list 
                                   ){
  
  # default list of highlight countries
  default_list = c("India","Singapore","Malaysia","Norway",
                                     "Denmark","United States","United Kingdom","China")
  
  # quoting y-axis variable
  y_var = enquo(y_var)

  # Data Prep.
  df %>% 
    mutate(highlight_type = case_when(country %in% countries ~ "Yes",
                                      TRUE ~ "No")) %>%
  # Plotting  
  ggplot() +
    geom_line(aes(x = year, y = round(!!y_var,2), col = country), size = 1.1) +
    
    # scale_x_continuous(breaks = seq(from = 1980, to = 2020, by = 5)) +
    # scale_y_continuous(labels = label_dollar(prefix = "", suffix = " %"),
    #                    breaks = seq(from = 0, to = 60, by = 5)) +
    
    gghighlight(highlight_type == "Yes",
                unhighlighted_params = list(size = 1, colour = alpha(background_line_color, 0.4))) +
    # facet_wrap(~continent) +
    
    theme_viny_bright() +
    theme(axis.text.x = element_text(angle = 90)
            ) +
    
    labs(title = "GDP/Cap for world countries across time",
         subtitle = "created by ViSa",
         caption = "Data Source: Gapminder",
         y = "Total Tax Revenue % of GDP" 
         )
}

country_highlight_plot(df = gap_longer, countries = c("Australia","Singapore"), background_line_color = "pink")
```

## ggcharts lib for dumbell plot 

getting issues with this

```{r}
library(ggcharts)
```


```{r}
head(gapminder_new)
```



```{r}
data("popeurope")
```

```{r}
head(popeurope)
```

```{r}
popeurope %>% 
  filter(country %in% c("India","Singapore","Malaysia","Norway",
                        "Denmark","United States","United Kingdom","China")) %>% 
  ggcharts::dumbbell_chart(x = country,
                           y1 = pop1952,
                           y2 = pop2007,
                           top_n = 10,
                           point_colors = c("lightgray","orange")
                            ) +
   scale_y_continuous(
    limits = c(0, NA),
    labels = function(x) paste(x, "Mn.")
  ) +
  theme_ng()
```

```{r}
dumbbell_chart(
  data = popeurope,
  x = country,
  y1 = pop1952,
  y2 = pop2007,
  top_n = 10,
  point_colors = c("lightgray", "#494F5C")
) +
  labs(
    x = NULL,
    y = "Population",
    title = "Europe's Largest Countries by Population in 2007"
  ) +
  scale_y_continuous(
    limits = c(0, NA),
    labels = function(x) paste(x, "Mn.")
  )
```


```{r}
gapminder_new %>% 
  select(country, "2010", "2019") %>% head() 
```



## ggalt for dumbell plots

```{r}
# devtools::install_github('bbc/bbplot')

library(ggalt)
library(bbplot)
```


```{r}
gapminder_new %>% 
  select(country, "2010", "2019") %>% 
  mutate(gap = "2019" - "2010") %>% head() 
```

```{r}
gapminder %>%
  filter(year == 1967 | year == 2007) %>%
  select(country, year, lifeExp) %>%
  spread(year, lifeExp) %>%
  mutate(gap = `2007` - `1967`) %>%
  arrange(desc(gap)) %>%
  head(10)
```


```{r}
gapminder_new %>% 
  filter(country %in% c("India","Singapore","Malaysia","Norway",
                        "Denmark","United States","United Kingdom","China")) %>% 
  select(country, "2010", "2019") %>% 
  mutate(gap = .[["2019"]] - .[["2010"]]) %>%
  arrange(desc(gap)) %>%
  
  ggplot(aes(x = .[["2010"]], xend = .[["2019"]], 
         y = reorder(country, gap), group = country)) +
  geom_dumbbell(colour = "#dddddd", size = 2,
                colour_x = "grey", colour_xend = "#FAAB18") +
  bbc_style()
```

```{r}
gapminder_new %>% 
  filter(country %in% c("India","Singapore","Malaysia","Norway",
                        "Denmark","United States","United Kingdom","China")) %>% 
  select(country, "1970", "2019") %>% 
  mutate(gap = .[["2019"]] - .[["1970"]]) %>% 
  arrange(desc(gap)) %>%

  ggplot(aes(x = .[["1970"]], xend = .[["2019"]],
         y = reorder(country, gap), group = country)) +
  geom_dumbbell(colour = "#dddddd", size = 2,
                colour_x = "grey", colour_xend = "#FAAB18") +
  bbc_style()
```

```{r}
head(gap_longer)
```


```{r}
gap_longer %>%
  group_by(continent) %>% 
  filter(country == top_n(x=.,n=5,wt=gdpPercap) %>% select(country))
```

Below code gives top 5 countries by gdpPercap across the years 

```{r}
Overall_top5 <- gap_longer %>% 
  group_by(continent, country) %>% 
  summarise(gdpPercap = max(gdpPercap, na.rm = T)) %>% 
  top_n(n = 5, wt = gdpPercap) %>% 
  ungroup()

Overall_top5
```


Below code gives top 5 countries by gdpPercap  of each continent across the years 

```{r}
gap_longer %>% 
  filter(
         country %in% (Overall_top5 %>% pull(country))) %>% 
  ggplot(aes(x = year, y = gdpPercap, color = country)) +
  geom_line() +
  facet_wrap(~continent) +
  theme_viny_bright() +
  theme(legend.position = "none",
        axis.text.x = element_text(angle = 90))

```

```{r}
Overall_top5 %>% select(country)
```



```{r}
gap_longer %>% 
  filter(year == 2019,
         country %in% (Overall_top5 %>% pull(country)))
```



```{r}
gap_longer %>% 
  filter(year == 2019,
         country %in% Overall_top5$country ) 

```





```{r}
gap_longer %>% 
  filter(
    year == 2019,
    country %in% (Overall_top5 %>% pull(country))
  )
```


```{r}
gap_longer %>% 
    filter(year == 2019, country %in% Overall_top5) 
```

```{r}
gap_longer %>% 
    filter(year == 2019, country %in% Overall_top5) %>% 
    pull(country)
```

```{r}
gap_longer %>% 
    filter(year == 2019, country %in% Overall_top5$country) %>% 
    select(country)
```


```{r}
top5_by_continents <- gap_longer %>% 
    filter(year == 2019, country %in% Overall_top5$country) %>% 
    pull(country)

top5_by_continents
```

```{r fig.height=10, fig.width=10}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% top5_by_continents ~ "Yes",
                                                 TRUE ~ "No"))  %>% 
  #filter(!is.na(continent)) %>% filter(!is.na(gdpPercap)) %>% #head()
  na.exclude %>% 
  ggplot() +
  geom_line(aes(x = year, y = gdpPercap, col = country), size = 1.1) +
  gghighlight(highlight_type == "Yes", 
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 60),
        legend.position = "none")
```

```{r}
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
  ggplot() +
  geom_line(aes(x = year, y = tax_revnue_perc_of_gdp, col = as.factor(country)), size = 1.1) +
  gghighlight(highlight_type == "Yes", 
              unhighlighted_params = list(size = 1, colour = alpha("grey", 0.4))) +
  facet_wrap(~continent) +
  theme_minimal() +
  theme(axis.text.x = element_text(angle = 60),
        legend.position = "none")
```


```{r}
gap_longer %>% 
  mutate(highlight_type = case_when(country %in% top5_by_continents ~ "Yes",
                                                 TRUE ~ "No"))  %>% 
  #filter(!is.na(continent)) %>% filter(!is.na(gdpPercap)) %>% #head()
  na.exclude %>% summary()
```

```{r}
tax_rev %>% 
  mutate(highlight_type = case_when(country %in%
                                 c("India","Singapore","Malaysia","Norway",
                                   "Denmark","United States","United Kingdom","China") ~ "Yes",
                               TRUE ~ "No")) %>%
  summary()
```


# plotly highlight charts

from: 

https://stackoverflow.com/questions/64385240/is-there-a-way-to-have-a-highlighted-chart-as-well-as-have-interactivity-of-sele?noredirect=1#comment113856801_64385240

https://plotly-r.com/client-side-linking.html#filter

```{r}
library(plotly)
```


```{r}
# from ggplot2 library

data("txhousing")
```


```{r}
txhousing %>% glimpse()
```

```{r}
txhousing %>%  head()
```


```{r}
tx <- highlight_key(txhousing, ~city)
```

```{r}
base <- plot_ly(tx, color = I("grey")) %>% 
  group_by(city)

```


```{r}
time_series <- base %>% 
                  group_by(city) %>% 
                  add_lines(x = ~date, y = ~median)
```


```{r}
highlight(
  time_series,
  on = "plotly_hover",
  selectize = FALSE,
  dynamic = FALSE,
  color = "red",
  persistent = FALSE
)
```


```{r}
plotly_1 <- gap_longer %>% 
  filter(continent == "Asia") %>% 
  na.exclude() %>% 
  
  plotly::highlight_key(., ~country)
```


```{r}
base <- plot_ly(plotly_1, color = I("grey")) %>% 
  group_by(country)

```


```{r}
time_series <- base %>% 
              group_by(country) %>% 
              add_lines(x = ~year, y = ~gdpPercap)
```


```{r}
highlight(
  time_series,
  on = "plotly_hover",
  selectize = FALSE,
  dynamic = FALSE,
  color = "red",
  persistent = FALSE
)
```


```{r}
plotly_1 <- gap_longer %>% 
  filter(continent == "Asia", gdpPercap < max(20000)) %>% 
  na.exclude() %>% 
  
  plotly::highlight_key(., ~country)
```


```{r}
base <- plot_ly(plotly_1, color = I("grey")) %>% 
  group_by(country)

```


```{r}
tme_series <- base %>% 
              group_by(country) %>% 
              add_lines(x = ~year, y = ~gdpPercap)
```


```{r}
highlight(
  time_series,
  on = "plotly_click",
  selectize = TRUE,
  dynamic = TRUE,
  color = "red",
  persistent = TRUE
)
```

```{r}
hist <- add_histogram(
  base,
  x = ~gdpPercap,
  histnorm = "probability density"
)

subplot(time_series, hist, nrows = 2) %>% 
  layout(barmode = "overlay", showlegend = FALSE) %>% 
  highlight(
    dynamic = TRUE,
    selectize = TRUE,
    color = "red",
    selected = attrs_selected(opacity = 0.3)
  )

```





### Trying to subtract row wise

```{r}
gapminder_new %>% 
  filter(country == c("India","Bangladesh"))
```

#### failed attempts

```{r}
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .[["India",]] - .[["Bangladesh",]]
```

```{r}
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .["India",] - .["Bangladesh",]
```


```{r}
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .[country == "India",] - .[country == "Bangladesh",]
```


```{r}
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .[India,] - .[Bangladesh,]
```


```{r}
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  .[[India,]] - .[[Bangladesh,]]
```


```{r}
gapminder_new %>% 
  filter(country == c("India","Bangladesh")) %>% 
  mutate(Diff_result = (. %>% filter(country == "India") ) - (. %>% filter(country == "Bangladesh"))  )
```

```{r}
gapminder_new[country == "India",] - gapminder_new[country == "Bangladesh",]
```

```{r}
gapminder_new[India,] - gapminder_new[Bangladesh,]
```

```{r}
gapminder_new %>% 
  filter(country == "India")
```

```{r}
rownames(gapminder_new[country == "India",])
```

```{r}
rownames(gapminder_new[country == India,])
```


```{r}
gapminder_new[country == "India",]
```

```{r}
gapminder_new
```


```{r}
rownames(gapminder_new) <- gapminder_new$country
```

```{r}
gapminder_new %>%  head()
```

```{r}
gapminder_new["India", 2: ncol(gapminder_new)] #- gapminder_new["Bangladesh", ]
```

```{r}
gapminder_new[, 2:ncol(gapminder_new)]
```

#### solution from stackoverflow

https://stackoverflow.com/questions/64410966/how-to-subtract-a-row-from-another-row-in-r

```{r}
gapminder_new %>% 
  filter(country %in% c("India","Bangladesh")) %>% 
  select(-1) %>% 
  mutate(across(everything(), ~lead(.x) - (.x))) %>% na.omit()
```


```{r}
gapminder_new %>% select(-1) %>% mutate(across(everything(), ~lead(.x) - (.x))) %>% na.omit()
```



```{r}
gapminder_new %>% 
  filter(country %in% c("India","Bangladesh"))
```

#### My own solution

```{r} 
test_set <- as.data.frame(gapminder_new)

rownames(test_set) <- test_set$country

head(test_set)
```

```{r}
test_set %>%  select(-country)

test_set["India",2:ncol(test_set)] - test_set["Bangladesh",2:ncol(test_set)]
```

### setting toolips / highcharter

from: https://jkunst.com/blog/posts/2019-02-04-using-tooltips-in-unexpected-ways/

```{r}
library(highcharter)
```

#### Series chart

```{r}
gp <- gapminder %>% 
  arrange(desc(year)) %>% 
  distinct(country, .keep_all = TRUE)

head(gp)
```


```{r}
gp2 <- gapminder %>% 
  select(country, year, pop) %>% 
  nest(-country) %>% 
  mutate(
    data = map(data, mutate_mapping, hcaes(x = year, y = pop), drop = TRUE),
    data = map(data, list_parse)
  ) %>% 
  rename(ttdata = data)

gp2
```


```{r}
gptot <- left_join(gp, gp2, by = "country")

head(gptot)
```

```{r}
hchart(
  gptot,
  "point",
  hcaes(x = lifeExp, y = gdpPercap, name = country, 
        size=pop, group=continent, name=country)
) %>% 
  
  hc_yAxis(type = "logarithmic") %>% 
  
  # this is what creates a chart in tooltip
  hc_tooltip(
    useHTML = TRUE,
    headerFormat = "<b>{point.key}</b>",
    pointFormatter = tooltip_chart(accesor = "ttdata")
  ) %>% 
  
  hc_title(text = "Tooltip chart within a Chart") %>% 
  hc_subtitle(text = "(ttchart: population growth)")
```  
  
##### log

```{r}
gp2_log <- gapminder %>% 
  select(country, year, pop) %>% 
  nest(-country) %>% 
  mutate(
    data = map(data, mutate_mapping, hcaes(x = year, y = log(pop)), drop = TRUE),
    data = map(data, list_parse)
  ) %>% 
  rename(ttdata_log = data)

gp2_log
```


```{r}
gptot_log <- left_join(gp, gp2_log, by = "country")

head(gptot_log)
```


```{r}
hchart(
  gptot_log,
  "point",
  hcaes(x = lifeExp, y = gdpPercap, name = country, 
        size=pop, group=continent, name=country)
) %>% 
  
  hc_yAxis(type = "logarithmic") %>% 
  
  # this is what creates a chart in tooltip
  hc_tooltip(
    useHTML = TRUE,
    headerFormat = "<b>{point.key}</b>",
    pointFormatter = tooltip_chart(accesor = "ttdata_log")
  ) %>% 
  
  hc_title(text = "Tooltip chart within a Chart") %>% 
  hc_subtitle(text = "(ttchart: log population growth)")
``` 

#### donut chart

from: https://jkunst.com/blog/posts/2019-02-04-using-tooltips-in-unexpected-ways/

```{r}
donutdata <- gp %>% 
  group_by(continent) %>% 
  summarise(pop = sum(pop/1e6) * 1e6)

donutdata
```

```{r}
hchart(donutdata, "pie",
       hcaes(name = continent, y = pop), innerSize = 300)
```


```{r}
donutdata2 <- 
  gp %>% 
  select(continent, lifeExp, gdpPercap) %>% 
  nest(-continent) %>% 
  mutate(
    data = map(data, mutate_mapping, hcaes(x = lifeExp, y = gdpPercap), drop = TRUE),
    data = map(data, list_parse)
  ) %>% 
  rename(ttdata = data) %>%
  left_join(donutdata)

donutdata2
```

```{r}
hc <- hchart(
  donutdata2, "pie", hcaes(name = continent, y = pop),
  innerSize = 375
)

hc
```


```{r}
hc %>% 
  hc_tooltip(
    useHTML = TRUE,
    headerFormat = "<b>{point.key}</b>",
    pointFormatter = tooltip_chart(
      accesor = "ttdata",
      hc_opts = list(
        chart = list(type = "scatter"),
        credits = list(enabled = FALSE),
        plotOptions = list(scatter = list(marker = list(radius = 2)))
        ),
      height = 225
      ),
    positioner = JS(
      "function () {
      
        /* one of the most important parts! */
        xp =  this.chart.chartWidth/2 - this.label.width/2
        yp =  this.chart.chartHeight/2 - this.label.height/2
      
        return { x: xp, y: yp };
      
      }"),
    shadow = FALSE,
    borderWidth = 0,
    backgroundColor = "transparent",
    hideDelay = 1000
  )
```





































